import re
from pprint import pprint
# Matches one ``<option value="VALUE">TEXT</option>`` tag and captures
# the pair (VALUE, TEXT).
model = re.compile(r'<option value="(.*?)">(.*?)</option>')


def get_raw_refer(path='data2.txt'):
    """Build a text -> value mapping from the ``<option>`` tags in a file.

    Args:
        path: File to scan; it is read as UTF-8. Defaults to
            ``'data2.txt'``, resolved against the current working directory.

    Returns:
        A dict mapping each option's display text to the content of its
        ``value`` attribute. If the same text appears more than once, the
        last occurrence wins.

    Raises:
        OSError: If the file cannot be opened.
    """
    with open(path, encoding='utf-8') as f:
        text = f.read()

    # ``.`` never matches a newline, so scanning the whole text finds exactly
    # the tags a line-by-line scan would find -- including every tag on a
    # line that holds several (previously only the first one was kept).
    return {name: code for code, name in model.findall(text)}

def get_refer():
    """Return the hard-coded lookup table of region name -> code string.

    Every value is a six-character numeric string. A new dict is created on
    each call, so the caller is free to modify the result.
    """
    name_code_pairs = (
        ('上海', '310000'),
        ('云南', '530000'),
        ('兵团', '660000'),
        ('内蒙古', '150000'),
        ('北京', '110000'),
        ('吉林', '220000'),
        ('四川', '510000'),
        ('天津', '120000'),
        ('宁夏', '640000'),
        ('安徽', '340000'),
        ('山东', '370000'),
        ('山西', '140000'),
        ('广东', '440000'),
        ('广西', '450000'),
        ('新疆', '650000'),
        ('江苏', '320000'),
        ('江西', '360000'),
        ('河北', '130000'),
        ('河南', '410000'),
        ('浙江', '330000'),
        ('海南', '460000'),
        ('湖北', '420000'),
        ('湖南', '430000'),
        ('甘肃', '620000'),
        ('福建', '350000'),
        ('西藏', '540000'),
        ('贵州', '520000'),
        ('辽宁', '210000'),
        ('重庆', '500000'),
        ('陕西', '610000'),
        ('青海', '630000'),
        ('黑龙江', '230000'),
    )
    return dict(name_code_pairs)



if __name__ == "__main__":
    # Script entry point: pretty-print the hard-coded lookup table.
    table = get_refer()
    pprint(table)




